package com.fengzhi.crawler.jsoup.parser.impl;

import java.util.Set;

import org.jsoup.nodes.Document;
import org.jsoup.nodes.Element;

/**
 * Declares parsing operations on jsoup {@link Document} and {@link Element}
 * objects: document denoising, image address extraction and link extraction.
 */
public interface BasicParser {

	/**
	 * Denoises the given document.
	 *
	 * @author fyf
	 * @param document the document to denoise
	 * @return the document after denoising
	 */
	Document denoiseForDoc(Document document);

	/**
	 * Gets image addresses from the given element.
	 *
	 * @author fyf
	 * @param element the element to read image addresses from
	 * @return the image addresses that were found
	 */
	Set<String> getImgUrl(Element element);

	/**
	 * Gets all links in the current page.
	 *
	 * <p>NOTE(review): presumably only links reachable from
	 * {@code contentElement} are returned; confirm against the implementations.
	 *
	 * @author fyf
	 * @param contentElement the element to read links from
	 * @return the links that were found
	 */
	Set<String> getLinks(Element contentElement);

}
